#!/usr/bin/env bash
#
# Launch triton_matmul.py with CUDA restricted to a chosen device.
#
# Environment:
#   TRITON_MATMUL_GPU  Optional. Value assigned to CUDA_VISIBLE_DEVICES for the
#                      run (e.g. "0" or "2,3"). Defaults to 7, the index that
#                      was previously hard-coded, so existing invocations
#                      behave exactly as before.
#
# Notes:
#   - Any CUDA_VISIBLE_DEVICES value inherited from the caller is overwritten,
#     as it always was; use TRITON_MATMUL_GPU to choose a different device.
#   - triton_matmul.py is looked up relative to the current working directory.

# Quoted so a comma-separated device list is passed through as one word.
export CUDA_VISIBLE_DEVICES="${TRITON_MATMUL_GPU:-7}"

python triton_matmul.py
